% Conference paper on contextual bandits for news recommendation.
% Typed as a proceedings paper: the venue belongs in booktitle, not journal.
@inproceedings{Li2010,
  author    = {Li, Lihong and Chu, Wei and Langford, John and Schapire, Robert E},
  title     = {A contextual-bandit approach to personalized news article recommendation},
  booktitle = {Proceedings of the 19th International Conference on World Wide Web},
  pages     = {661--670},
  year      = {2010},
}

% Book: Sutton and Barto, reinforcement learning textbook (2018 printing, second edition).
% Publisher name is capitalised as a proper name.
@book{Sutton2018,
  author    = {Sutton, Richard S and Barto, Andrew G},
  title     = {Reinforcement learning: An introduction},
  edition   = {Second},
  publisher = {MIT Press},
  year      = {2018},
}

% Journal article on greedy approximation for submodular maximisation (part I).
% The dash is written as the ASCII ligature --- so classic 8-bit BibTeX handles it,
% and the part number I is braced so sentence-casing styles do not lowercase it.
@article{Nemhauser1978,
  author  = {Nemhauser, George L and Wolsey, Laurence A and Fisher, Marshall L},
  title   = {An analysis of approximations for maximizing submodular set functions---{I}},
  journal = {Mathematical Programming},
  volume  = {14},
  number  = {1},
  pages   = {265--294},
  year    = {1978},
}

% Book: Ross, Stochastic processes (John Wiley and Sons, 1996).
@book{Ross1996,
  author    = {Ross, Sheldon M},
  title     = {Stochastic processes},
  publisher = {John Wiley \& Sons},
  year      = {1996},
}

% Journal article: Thompson, Biometrika 25(3/4), 1933.
@article{Thompson1933,
  author  = {Thompson, William R},
  title   = {On the likelihood that one unknown probability exceeds another in view of the evidence of two samples},
  journal = {Biometrika},
  volume  = {25},
  number  = {3/4},
  pages   = {285--294},
  year    = {1933},
}

% Journal article: Audibert and Bubeck, regret bounds under partial monitoring (JMLR vol. 11).
@article{Audibert2010,
  author  = {Audibert, Jean-Yves and Bubeck, S{\'e}bastien},
  title   = {Regret bounds and minimax policies under partial monitoring},
  journal = {Journal of Machine Learning Research},
  volume  = {11},
  pages   = {2785--2836},
  year    = {2010},
}

% Book: Boyd and Vandenberghe, Convex optimization (Cambridge University Press, 2004).
@book{Boyd2004,
  author    = {Boyd, Stephen and Vandenberghe, Lieven},
  title     = {Convex optimization},
  publisher = {Cambridge University Press},
  year      = {2004},
}

% Journal article on sensor placement with Gaussian processes (JMLR vol. 9).
% The proper noun Gaussian is braced so sentence-casing styles keep its capital.
@article{Krause2008,
  author  = {Krause, Andreas and Singh, Amarjeet and Guestrin, Carlos},
  title   = {Near-optimal sensor placements in {Gaussian} processes: Theory, efficient algorithms and empirical studies},
  journal = {Journal of Machine Learning Research},
  volume  = {9},
  pages   = {235--284},
  year    = {2008},
}

% Book: Kleinrock, Queueing systems, volume 1.
% The publisher's city is kept in the address field rather than fused into publisher.
@book{Kleinrock1975,
  author    = {Kleinrock, Leonard},
  title     = {Queueing systems},
  volume    = {1},
  publisher = {Wiley},
  address   = {New York},
  year      = {1975},
}

% Journal article: tutorial on Thompson sampling.
% The surname Thompson is braced so sentence-casing styles keep its capital.
@article{Russo2018,
  author  = {Russo, Daniel J and Van Roy, Benjamin and Kazerouni, Abbas and Osband, Ian and Wen, Zheng},
  title   = {A tutorial on {Thompson} sampling},
  journal = {Foundations and Trends in Machine Learning},
  volume  = {11},
  number  = {1},
  pages   = {1--96},
  year    = {2018},
}

% Conference paper: Agrawal and Goyal, Thompson sampling for linear contextual bandits.
@inproceedings{Agrawal2013,
  author    = {Agrawal, Shipra and Goyal, Navin},
  title     = {Thompson sampling for contextual bandits with linear payoffs},
  booktitle = {International Conference on Machine Learning},
  pages     = {127--135},
  year      = {2013},
}

% Book: Cover and Thomas, Elements of information theory (John Wiley and Sons, 2006).
@book{Cover2006,
  author    = {Cover, Thomas M and Thomas, Joy A},
  title     = {Elements of information theory},
  publisher = {John Wiley \& Sons},
  year      = {2006},
}

% Conference paper on Gaussian process optimisation in the bandit setting.
% Typed as a proceedings paper; the venue name no longer repeats
% the phrase International Conference on.
@inproceedings{Srinivas2010,
  author    = {Srinivas, Niranjan and Krause, Andreas and Kakade, Sham M and Seeger, Matthias W},
  title     = {{Gaussian} process optimization in the bandit setting: No regret and experimental design},
  booktitle = {Proceedings of the 27th International Conference on Machine Learning},
  pages     = {1015--1022},
  year      = {2010},
}

% Book: Bertsekas, Dynamic programming and optimal control, volume 1 (Athena Scientific, 2017).
@book{Bertsekas2017,
  author    = {Bertsekas, Dimitri P},
  title     = {Dynamic programming and optimal control},
  volume    = {1},
  publisher = {Athena Scientific},
  year      = {2017},
}

% Conference paper on eligibility traces for off-policy policy evaluation.
% Typed as a proceedings paper: the venue belongs in booktitle, not journal.
@inproceedings{Precup2000,
  author    = {Precup, Doina and Sutton, Richard S and Singh, Satinder P},
  title     = {Eligibility traces for off-policy policy evaluation},
  booktitle = {Proceedings of the Seventeenth International Conference on Machine Learning},
  pages     = {759--766},
  year      = {2000},
}

% Book: Newman, Networks: an introduction (Oxford University Press, 2010).
@book{Newman2010,
  author    = {Newman, Mark},
  title     = {Networks: an introduction},
  publisher = {Oxford University Press},
  year      = {2010},
}

% Technical report introducing PageRank.
% Typed as a technical report with the issuing body in institution; the
% camel-case name PageRank is braced so styles do not lowercase it.
@techreport{Page1999,
  author      = {Page, Lawrence and Brin, Sergey and Motwani, Rajeev and Winograd, Terry},
  title       = {The {PageRank} citation ranking: Bringing order to the web},
  institution = {Stanford InfoLab},
  year        = {1999},
}

% Journal article: Freeman, betweenness-based centrality measures (Sociometry).
% NOTE(review): volume 40 and issue 1 were added from the published record; confirm against the source.
@article{Freeman1977,
  author  = {Freeman, Linton C},
  title   = {A set of measures of centrality based on betweenness},
  journal = {Sociometry},
  volume  = {40},
  number  = {1},
  pages   = {35--41},
  year    = {1977},
}

% Book: Cormen, Leiserson, Rivest and Stein, Introduction to algorithms (MIT Press, 2009).
@book{Cormen2009,
  author    = {Cormen, Thomas H and Leiserson, Charles E and Rivest, Ronald L and Stein, Clifford},
  title     = {Introduction to algorithms},
  publisher = {MIT Press},
  year      = {2009},
}

% Journal article: neural probabilistic language model (JMLR vol. 3).
% Journal name is capitalised as a proper name, since styles do not recase this field.
@article{Bengio2003,
  author  = {Bengio, Yoshua and Ducharme, R{\'e}jean and Vincent, Pascal and Jauvin, Christian},
  title   = {A neural probabilistic language model},
  journal = {Journal of Machine Learning Research},
  volume  = {3},
  pages   = {1137--1155},
  year    = {2003},
}

% Conference paper introducing the attention-only sequence model.
% Typed as a proceedings paper: the venue is a proceedings series, so it
% belongs in booktitle rather than journal.
@inproceedings{Vaswani2017,
  author    = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N and Kaiser, {\L}ukasz and Polosukhin, Illia},
  title     = {Attention is all you need},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {30},
  year      = {2017},
}

% arXiv preprint on evaluating code-trained language models.
% Typed as misc with the arXiv identifier in the eprint fields instead of a
% fake booktitle. NOTE(review): primaryclass cs.LG should be confirmed on the arXiv listing.
@misc{Chen2021,
  author        = {Chen, Mark and Tworek, Jerry and Jun, Heewoo and Yuan, Qiming and Pinto, Henrique Ponde de Oliveira and Kaplan, Jared and Edwards, Harri and Burda, Yuri and Joseph, Nicholas and Brockman, Greg and others},
  title         = {Evaluating large language models trained on code},
  year          = {2021},
  eprint        = {2107.03374},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
}

% Conference paper on few-shot learning with large language models.
% Typed as a proceedings paper: the venue is a proceedings series, so it
% belongs in booktitle rather than journal.
@inproceedings{Brown2020,
  author    = {Brown, Tom and Mann, Benjamin and Ryder, Nick and Subbiah, Melanie and Kaplan, Jared D and Dhariwal, Prafulla and Neelakantan, Arvind and Shyam, Pranav and Saxena, Girish and Sharma, Amanda and others},
  title     = {Language models are few-shot learners},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {33},
  pages     = {1877--1901},
  year      = {2020},
}